# HDFSToJson has already been run in NAVIFREQ_ALL_CLASSIFY_WORLDWEB.sh.
# Convert the GBK-encoded REC file provided by Teacher Tian to UTF-8, merge
# all of the data into a single line, and store the result in HDFS.
#/tmp/InternationalData_source/domain_code_belongs_continent3.txt

#######################################
# Submit one job from the makeChange jar to YARN in cluster mode, using the
# resource settings shared by every step of this script.
# Arguments: $1 - fully qualified name of the main class to run
# Returns:   the exit status of spark-submit
#######################################
submit_transform_job() {
  # spark.network.timeout is given without a unit suffix.
  # NOTE(review): confirm which unit Spark applies to a bare number here.
  # spark.yarn.preserve.staging.files=true asks YARN to keep the staged
  # files after the job ends instead of deleting them.
  spark-submit \
    --master yarn \
    --deploy-mode cluster \
    --num-executors 8 \
    --executor-memory 11G \
    --driver-memory 2G \
    --executor-cores 3 \
    --conf spark.network.timeout=10000000 \
    --conf spark.yarn.preserve.staging.files=true \
    --class "$1" \
    /data/yzw/original-makeChange-1.0-SNAPSHOT.jar
}

# Run the two steps in order. The second step is only started when the first
# spark-submit exits successfully, so a failed first step is not followed by
# a conversion of missing or stale data; the failing status becomes the
# status of this script.
# NOTE(review): presumably CSYD_TABLEMETA_WORLDJsonToREC consumes the output
# of CSYD_TABLEMETA_WORLD, and spark-submit waits for the YARN application to
# finish before returning (the documented default in cluster mode) - confirm.
submit_transform_job com.cnki.result_transform.CSYD_TABLEMETA_WORLD &&
  submit_transform_job com.cnki.result_transform.CSYD_TABLEMETA_WORLDJsonToREC